Biologically Inspired Oscillating Activation Functions Can Bridge the Performance Gap Between Biological and Artificial Neurons¶
These are notes summarizing and offering implementations of the ideas presented in this paper.
import math
from matplotlib import pyplot as plt
import numpy as np
import random
from IPython.display import display, Math
General Reasoning¶
It was recently discovered that humans have "pyramidal" neurons capable of learning the XOR function with just a single neuron. This property can be re-created in artificial neurons by replacing the typical activation functions (sigmoid, ReLU, tanh, etc.) with "oscillating activation functions".
With those conventional activation functions, a single neuron can't learn the XOR function; you need a multi-layer network (hidden layers feeding an output layer).
Because these neurons can have more than one hyperplane in their decision boundary, they are expected to do better on classification problems.
Oscillating Activation Functions¶
Oscillating activation functions have more than one zero, which allows a single neuron to have multiple hyperplanes in its decision boundary.
Solving XOR requires at least 2 hyperplanes.
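To see where the extra hyperplanes come from, take an activation with several zeros, like the cubic $z - z^3 = z(1-z)(1+z)$ defined just below. A single neuron computing $f(w_1x_1 + w_2x_2 + b)$ changes sign exactly where its pre-activation crosses a zero of $f$, so its decision boundary is the set of parallel hyperplanes $$w_1x_1 + w_2x_2 + b \in \{-1,\ 0,\ 1\}$$ which is already enough for XOR. A monotonic activation has at most one zero, hence only one hyperplane.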
The following three oscillating activation functions were presented: the "Shifted Quadratic Unit" (SQU), the "Non-Monotonic Cubic Unit" (NCU), and the "Shifted Sinc Unit" (SSU).
SQU = lambda z: z + z**2                         # Shifted Quadratic Unit
NCU = lambda z: z - z**3                         # Non-Monotonic Cubic Unit
sinc = lambda z: 1 if z == 0 else math.sin(z)/z  # unnormalized sinc helper
SSU = lambda z: math.pi*sinc(z - math.pi)        # Shifted Sinc Unit
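A quick plot of the three (using the same np.vectorize trick as the DSU plot later) makes the extra zero crossings easy to see:
# Plot the three activations near the origin; each crosses zero more than once
z = np.linspace(-4, 4, 400)
for name, fn in [("SQU", SQU), ("NCU", NCU), ("SSU", SSU)]:
    plt.plot(z, np.vectorize(fn)(z), label=name)
plt.axhline(0, color="gray", linewidth=0.5)
plt.legend()
plt.show()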
Making Activation Functions Useful¶
Not all activation functions with the above property are useful. To be useful, an activation function must also be more-or-less linear for small values: models usually start with small weights, and we want the derivative near the origin to be close to 1 so the neuron has a chance to learn quickly. For that reason the following don't work well:
- $\cos(z)$
- $z^2$
- $z^3$
These functions can be made useful simply by shifting them or adding a linear term so that they have a derivative of 1 at the origin:
- $\sin(z)$
- $z^2 + z$
- $z - z^3$
A benefit of the network being linear for small values is that it won't immediately use its non-linear features, which helps avoid overfitting.
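A quick numerical check makes the point: the slope at the origin is roughly 0 for the first group and roughly 1 for the fixed versions (central differences below, applied to the functions listed above).
# Central-difference slope at z = 0 for the "bad" functions and their fixed counterparts
slope_at_0 = lambda f, h=1e-5: (f(h) - f(-h)) / (2*h)
for name, f in [("cos(z)", math.cos), ("z^2", lambda z: z**2), ("z^3", lambda z: z**3),
                ("sin(z)", math.sin), ("z^2 + z", SQU), ("z - z^3", NCU)]:
    print(f"{name:>8}: slope at 0 ~ {slope_at_0(f):.3f}")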
Results¶
The paper's results show the oscillating activation functions outperforming the conventional ones!
Afterthoughts¶
Correlation To Fractal Noise¶
Curiously, the second-best-performing activation function is reported to be the Decaying Sine Unit (DSU), given as:
DSU = lambda z: (math.pi/2) *( sinc( z - math.pi) - sinc(z + math.pi))
_dsu = np.vectorize(DSU)
x = np.linspace(-50, 50, 100*5)
y = _dsu(x)
plt.plot(x, y)
plt.show()
A lot of procedural texture generation (and terrain generation) uses fractal noise functions, and I can't help but wonder if this helps filter the images into those sorts of components.
Re-Implementation¶
Quick re-derivation of SGD using MSE on Oscillating Functions¶
We're quickly gonna set up the gradient equations for using MSE with a few of these functions. We'll be using a linear-combination model (carrying a bias $b$, as in the code below) of the form: $$\mathrm{model}(x_1, x_2) = \mathrm{SQU}(w_1x_1 + w_2x_2 + b)$$ $$loss = (\mathrm{model}(x_1, x_2) - y)^2$$ $$loss = (\mathrm{SQU}(w_1x_1 + w_2x_2 + b) - y)^2$$
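Before grinding through the symbolic algebra, note that the chain rule already gives the general shape of these gradients for any activation $f$: $$\frac{\partial\,loss}{\partial w_i} = 2\big(f(z) - y\big)\,f'(z)\,x_i, \qquad \frac{\partial\,loss}{\partial b} = 2\big(f(z) - y\big)\,f'(z), \qquad z = w_1x_1 + w_2x_2 + b$$ For SQU this is just $2(z + z^2 - y)(1 + 2z)\,x_i$, since $\mathrm{SQU}'(z) = 1 + 2z$; the symbolic engine below mostly serves to double-check the messier DSU case.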
DSU¶
# Symbolic variables; these cells use a CAS (SageMath-style var/diff/simplify/latex) rather than plain Python
var('x_1 x_2 theta_1 theta_2 y b')
(x_1, x_2, theta_1, theta_2, y, b)
hypo_1 = theta_1*x_1 + theta_2*x_2 + b
# DSU, matching the Python definition above (the pi/2 factor multiplies both sinc terms)
hypo_2 = (pi/2) * ((sin(hypo_1 - pi) / (hypo_1 - pi)) - (sin(hypo_1 + pi) / (hypo_1 + pi)))
j = (hypo_2 - y)**2
f = diff(j, theta_2)
Math(latex(simplify(f)))
That's uhh... pretty intense. Let's try SQU instead.
SQU¶
hypo_2 = hypo_1 + hypo_1**2 # This is the SQU part
j = (hypo_2 - y)**2
f = diff(j, theta_1)
simplify(f)
2*((theta_1*x_1 + theta_2*x_2 + b)^2 + theta_1*x_1 + theta_2*x_2 + b - y)*(2*(theta_1*x_1 + theta_2*x_2 + b)*x_1 + x_1)
simplify(diff(j, theta_2))
2*((theta_1*x_1 + theta_2*x_2 + b)^2 + theta_1*x_1 + theta_2*x_2 + b - y)*(2*(theta_1*x_1 + theta_2*x_2 + b)*x_2 + x_2)
simplify(diff(j, b))
2*((theta_1*x_1 + theta_2*x_2 + b)^2 + theta_1*x_1 + theta_2*x_2 + b - y)*(2*theta_1*x_1 + 2*theta_2*x_2 + 2*b + 1)
Cleaned up, the gradient with respect to $\theta_1$ is $$\frac{\partial J}{\partial \theta_1} = 2\big((\theta_1x_1 + \theta_2x_2 + b)^2 + \theta_1x_1 + \theta_2x_2 + b - y\big)\big(2(\theta_1x_1 + \theta_2x_2 + b)\,x_1 + x_1\big)$$
NCU¶
Okay, Mr. TearGosling Sir said that NCU was prettier, so let's have a look at it.
hypo_1 = theta_1*x_1 + theta_2*x_2
hypo_2 = hypo_1 - hypo_1**3 # This is the NCU part
j = (hypo_2 - y)**2 # recompute the loss for the NCU hypothesis
Math(latex(diff(j, theta_2)))
Well these last two aren't so bad, and apparently NCU works best. Somehow I missed it when I read the list.
f = diff(j, theta_1)
Math(latex(simplify(f)))
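Written compactly (a hand-derived check against the symbolic output, using the bias-free model above and $\mathrm{NCU}'(z) = 1 - 3z^2$): $$\frac{\partial\,loss}{\partial \theta_i} = 2\big(z - z^3 - y\big)\big(1 - 3z^2\big)\,x_i, \qquad z = \theta_1 x_1 + \theta_2 x_2$$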
Actually Doing SGD Now¶
Now that we've done a little bit of leg-work with the math above, we can implement a simple version of SGD for this new activation function.
X_control = np.random.uniform(size=[100, 2])
# Linear target: 0.25*x1 + 0.25*x2 plus a constant offset (taken from the first sample)
Y_control = np.sum(0.25*X_control, axis=1) + X_control[0][0]
The paper claimed to use mean-squared error and stochastic gradient descent to optimize this, so we'll try that too.
def avg_loss(w: np.array, Xs: np.array, Ys: np.array):
    s = 0
    for x, y in zip(Xs, Ys):
        pred = SQU(w[0]*x[0] + w[1]*x[1] + w[2])
        s += (y - pred)**2
    return s / Ys.shape[0]
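(As an aside, the same loss can be computed without the Python loop. `avg_loss_vec` below is just a name for a vectorized sketch that applies SQU elementwise; it's not from the paper.)
def avg_loss_vec(w, Xs, Ys):
    z = Xs @ w[:2] + w[2]     # linear part for every sample at once
    preds = z + z**2          # SQU applied elementwise
    return np.mean((Ys - preds)**2)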
def squ_mse_gradient(w: np.array, x: np.array, y: float):
    l = w[0]*x[0] + w[1]*x[1] + w[2]
    # Gradients copied from the symbolic results above (note ** here, not Sage's ^)
    g0 = 2*((l)**2 + l - y)*(2*(l)*x[0] + x[0])
    g1 = 2*((l)**2 + l - y)*(2*(l)*x[1] + x[1])
    g2 = 2*((l)**2 + l - y)*(2*w[0]*x[0] + 2*w[1]*x[1] + 2*w[2] + 1)
    # Without bias
    #g0 = 2*((l)**2 + l - y)*(2*(l)*x[1] + x[1])
    #g1 = 2*((l)**2 + l - y)*(2*(l)*x[0] + x[0])
    return np.array([g0, g1, g2])
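Hand-copied gradients are easy to get subtly wrong, so here's a quick finite-difference check (the `check_gradient` helper is mine, not from the paper); the two arrays it returns should agree to several decimal places.
def check_gradient(w, x, y, h=1e-6):
    # Compare the analytic gradient against central differences of the single-sample loss
    loss = lambda w_: (SQU(w_[0]*x[0] + w_[1]*x[1] + w_[2]) - y)**2
    numeric = np.zeros(3)
    for k in range(3):
        wp, wm = w.copy(), w.copy()
        wp[k] += h
        wm[k] -= h
        numeric[k] = (loss(wp) - loss(wm)) / (2*h)
    return numeric, squ_mse_gradient(w, x, y)

check_gradient(np.array([0.3, -0.2, 0.1]), np.array([0.5, 0.7]), 0.4)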
def fit(X, Y, iterations=200, lr=0.001):
    w = np.array([1, 1, 1], dtype=np.float64)
    for _ in range(iterations):
        i = random.randint(0, Y.shape[0]-1)
        x, y = X[i], Y[i]
        a = squ_mse_gradient(w, x, y)
        w -= lr * a
    return w
weights = np.array([1, 1, 1], dtype=np.float64)
avg_loss(weights, X_control, Y_control)
31.4772287225186
weights = fit(X_control, Y_control)
avg_loss(weights, X_control, Y_control)
0.07734606914918682
Looks like it's working.
Fitting XOR¶
The paper claims this activation lets a single neuron (a lone perceptron) learn the XOR operation, something the standard activation functions can't do. We'll test this out with our new SGD implementation.
# Gotta make sure to shift the inputs and targets from {0, 1} to {-1, +1} so everything is centered on the origin
XOR = np.array([ [-1, -1], [-1, 1], [1, -1], [1, 1]])
YOR = np.array([ -1, 1, 1, -1])
weights = np.array([1, 1, 1], dtype=np.float64)
avg_loss(weights, XOR, YOR)
43.0
weights = fit(XOR, YOR, iterations=2000)
avg_loss(weights, XOR, YOR)
0.49727671369496174
for i, ii in zip(XOR, YOR):
    print(i, '->', SQU(weights[0]*i[0] + weights[1]*i[1] + weights[2]) > 0)
[-1 -1] -> False
[-1  1] -> True
[ 1 -1] -> True
[1 1] -> False
Tadah! Guess they weren't lying.
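As a sanity check on the other half of the claim: for any monotonic activation, thresholding $f(w_1x_1 + w_2x_2 + b)$ is the same as checking which side of a single hyperplane you're on, so a crude sweep over weights is enough to confirm that no single linear boundary gets all four XOR points right.
# Brute-force a grid of (w1, w2, b); a single hyperplane never classifies all 4 XOR points
grid = np.linspace(-3, 3, 25)
best = 0
for w1 in grid:
    for w2 in grid:
        for b in grid:
            preds = (w1*XOR[:, 0] + w2*XOR[:, 1] + b) > 0
            best = max(best, int(np.sum(preds == (YOR > 0))))
print("Best a single hyperplane manages on XOR:", best, "of 4")  # expect 3, never 4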